#!/usr/bin/env python
# $Id: test2-17.py df54dec975f4 2012/09/09 20:22:40 pgurumur $
# Copyright (c) 2012 Prabhu Gurumurthy <pgurumur@gmail.com>
#
# Permission to use, copy, modify, and distribute this software for any
# purpose with or without fee is hereby granted, provided that the above
# copyright notice and this permission notice appear in all copies.
#
# THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
# WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
# MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
# ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
# WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
# ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
# OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
#

__version__  = "$Revision: df54dec975f4 $"
__author__   = "$Author: pgurumur $"
__modified__ = "$Date: 2012-09-09 20:22:40Z $"

import urllib2
import sys

from StringIO import StringIO
from lxml import etree


class Target(object):
   def __init__(self):
      self._capture = False

   def start(self, tag, attr):
      if tag  == "em":
         self._capture = True

   def end(self, tag):
      self._capture = False

   def data(self, data):
      if self._capture:
         try:
            print(data)
         except UnicodeEncodeError:
            pass

if __name__ == "__main__":
   package = sys.argv[1]
   if package:
      try:
         urldata = urllib2.urlopen(
               "http://openports.se/search.php?stype=folder&so=%s" %package)
      except URLError, message:
         print "errror"
         sys.exit(1)
      else:
         parser = etree.HTMLParser(target = Target())
         tree = etree.parse(StringIO(urldata.read()), parser)
